#ifndef CUFFTDX_FFT_30_FP16_FWD_PTX_HPP
#define CUFFTDX_FFT_30_FP16_FWD_PTX_HPP



template<> __forceinline__ __device__ void cufftdx_private_function<760, __half2, 1>(cufftdx::detail::complex<__half2> *rmem, unsigned smem){

asm volatile (R"({
.reg .b16 rs<203>;
.reg .b32 r<3433>;
.reg .f64 fd<174>;
.reg .b64 rd<3>;
mov.f64 fd123, 0d3FD3C6EF372FE950;
{
cvt.rn.f16.f64 rs1, fd123;
}
mov.b32 r210, {rs1, rs1};
mov.f64 fd130, 0dBFEE6F0E134454FF;
{
cvt.rn.f16.f64 rs2, fd130;
}
mov.b32 r228, {rs2, rs2};
mov.f64 fd135, 0dBFE9E3779B97F4A8;
{
cvt.rn.f16.f64 rs3, fd135;
}
mov.b32 r282, {rs3, rs3};
mov.f64 fd136, 0dBFE2CF2304755A5E;
{
cvt.rn.f16.f64 rs4, fd136;
}
mov.b32 r300, {rs4, rs4};
{
cvt.rn.f16.f64 rs5, fd123;
}
mov.b32 r291, {rs5, rs5};
{
cvt.rn.f16.f64 rs6, fd130;
}
{
neg.f16 rs7, rs6;
}
mov.b32 r306, {rs7, rs7};
{
add.f16x2 r1, %66, %63;
}
{
add.f16x2 r4, %67, r1;
}
{
add.f16x2 r7, %69, %65;
}
{
add.f16x2 r10, r4, r7;
}
{
add.f16x2 r13, %61, %68;
}
{
add.f16x2 r16, %62, r13;
}
{
add.f16x2 r19, %64, %60;
}
{
add.f16x2 r22, r16, r19;
}
{
add.f16x2 r25, %66, %63;
}
{
mul.f16x2 r28, r25, r210;
}
{
add.f16x2 r31, %67, r28;
}
{
add.f16x2 r34, %69, %65;
}
{
mul.f16x2 r37, r34, r282;
}
{
add.f16x2 r40, r31, r37;
}
{
sub.f16x2 r43, %61, %68;
}
{
mul.f16x2 r46, r43, r228;
}
{
sub.f16x2 r49, %64, %60;
}
{
mul.f16x2 r52, r49, r300;
}
{
add.f16x2 r55, r46, r52;
}
{
sub.f16x2 r58, r40, r55;
}
{
add.f16x2 r61, %66, %63;
}
{
mul.f16x2 r64, r61, r210;
}
{
add.f16x2 r67, %67, r64;
}
{
add.f16x2 r70, %69, %65;
}
{
mul.f16x2 r73, r70, r282;
}
{
add.f16x2 r76, r67, r73;
}
{
sub.f16x2 r79, %61, %68;
}
{
mul.f16x2 r82, r79, r228;
}
{
sub.f16x2 r85, %64, %60;
}
{
mul.f16x2 r88, r85, r300;
}
{
add.f16x2 r91, r82, r88;
}
{
add.f16x2 r94, r76, r91;
}
{
add.f16x2 r97, %66, %63;
}
{
mul.f16x2 r100, r97, r282;
}
{
add.f16x2 r103, %67, r100;
}
{
add.f16x2 r106, %69, %65;
}
{
mul.f16x2 r109, r106, r291;
}
{
add.f16x2 r112, r103, r109;
}
{
sub.f16x2 r115, %61, %68;
}
{
mul.f16x2 r118, r115, r300;
}
{
sub.f16x2 r121, %64, %60;
}
{
mul.f16x2 r124, r121, r306;
}
{
add.f16x2 r127, r118, r124;
}
{
sub.f16x2 r130, r112, r127;
}
{
add.f16x2 r133, %66, %63;
}
{
mul.f16x2 r136, r133, r282;
}
{
add.f16x2 r139, %67, r136;
}
{
add.f16x2 r142, %69, %65;
}
{
mul.f16x2 r145, r142, r291;
}
{
add.f16x2 r148, r139, r145;
}
{
sub.f16x2 r151, %61, %68;
}
{
mul.f16x2 r154, r151, r300;
}
{
sub.f16x2 r157, %64, %60;
}
{
mul.f16x2 r160, r157, r306;
}
{
add.f16x2 r163, r154, r160;
}
{
add.f16x2 r166, r148, r163;
}
{
add.f16x2 r169, %61, %68;
}
{
mul.f16x2 r172, r169, r210;
}
{
add.f16x2 r175, %62, r172;
}
{
add.f16x2 r178, %64, %60;
}
{
mul.f16x2 r181, r178, r282;
}
{
add.f16x2 r184, r175, r181;
}
{
sub.f16x2 r187, %66, %63;
}
{
mul.f16x2 r190, r187, r228;
}
{
sub.f16x2 r193, %69, %65;
}
{
mul.f16x2 r196, r193, r300;
}
{
add.f16x2 r199, r190, r196;
}
{
add.f16x2 r202, r184, r199;
}
{
add.f16x2 r205, %61, %68;
}
{
mul.f16x2 r208, r205, r210;
}
{
add.f16x2 r211, %62, r208;
}
{
add.f16x2 r214, %64, %60;
}
{
mul.f16x2 r217, r214, r282;
}
{
add.f16x2 r220, r211, r217;
}
{
sub.f16x2 r223, %66, %63;
}
{
mul.f16x2 r226, r223, r228;
}
{
sub.f16x2 r229, %69, %65;
}
{
mul.f16x2 r232, r229, r300;
}
{
add.f16x2 r235, r226, r232;
}
{
sub.f16x2 r238, r220, r235;
}
{
add.f16x2 r241, %61, %68;
}
{
mul.f16x2 r244, r241, r282;
}
{
add.f16x2 r247, %62, r244;
}
{
add.f16x2 r250, %64, %60;
}
{
mul.f16x2 r253, r250, r291;
}
{
add.f16x2 r256, r247, r253;
}
{
sub.f16x2 r259, %66, %63;
}
{
mul.f16x2 r262, r259, r300;
}
{
sub.f16x2 r265, %69, %65;
}
{
mul.f16x2 r268, r265, r306;
}
{
add.f16x2 r271, r262, r268;
}
{
add.f16x2 r274, r256, r271;
}
{
add.f16x2 r277, %61, %68;
}
{
mul.f16x2 r280, r277, r282;
}
{
add.f16x2 r283, %62, r280;
}
{
add.f16x2 r286, %64, %60;
}
{
mul.f16x2 r289, r286, r291;
}
{
add.f16x2 r292, r283, r289;
}
{
sub.f16x2 r295, %66, %63;
}
{
mul.f16x2 r298, r295, r300;
}
{
sub.f16x2 r301, %69, %65;
}
{
mul.f16x2 r304, r301, r306;
}
{
add.f16x2 r307, r298, r304;
}
{
sub.f16x2 r310, r292, r307;
}
{
cvt.rn.f16.f64 rs9, fd123;
}
mov.b32 r522, {rs9, rs9};
{
cvt.rn.f16.f64 rs10, fd130;
}
mov.b32 r540, {rs10, rs10};
{
cvt.rn.f16.f64 rs11, fd135;
}
mov.b32 r594, {rs11, rs11};
{
cvt.rn.f16.f64 rs12, fd136;
}
mov.b32 r612, {rs12, rs12};
{
cvt.rn.f16.f64 rs13, fd123;
}
mov.b32 r603, {rs13, rs13};
{
cvt.rn.f16.f64 rs14, fd130;
}
{
neg.f16 rs15, rs14;
}
mov.b32 r618, {rs15, rs15};
{
add.f16x2 r313, %74, %71;
}
{
add.f16x2 r316, %75, r313;
}
{
add.f16x2 r319, %77, %73;
}
{
add.f16x2 r322, r316, r319;
}
{
add.f16x2 r325, %79, %76;
}
{
add.f16x2 r328, %70, r325;
}
{
add.f16x2 r331, %72, %78;
}
{
add.f16x2 r334, r328, r331;
}
{
add.f16x2 r337, %74, %71;
}
{
mul.f16x2 r340, r337, r522;
}
{
add.f16x2 r343, %75, r340;
}
{
add.f16x2 r346, %77, %73;
}
{
mul.f16x2 r349, r346, r594;
}
{
add.f16x2 r352, r343, r349;
}
{
sub.f16x2 r355, %79, %76;
}
{
mul.f16x2 r358, r355, r540;
}
{
sub.f16x2 r361, %72, %78;
}
{
mul.f16x2 r364, r361, r612;
}
{
add.f16x2 r367, r358, r364;
}
{
sub.f16x2 r370, r352, r367;
}
{
add.f16x2 r373, %74, %71;
}
{
mul.f16x2 r376, r373, r522;
}
{
add.f16x2 r379, %75, r376;
}
{
add.f16x2 r382, %77, %73;
}
{
mul.f16x2 r385, r382, r594;
}
{
add.f16x2 r388, r379, r385;
}
{
sub.f16x2 r391, %79, %76;
}
{
mul.f16x2 r394, r391, r540;
}
{
sub.f16x2 r397, %72, %78;
}
{
mul.f16x2 r400, r397, r612;
}
{
add.f16x2 r403, r394, r400;
}
{
add.f16x2 r406, r388, r403;
}
{
add.f16x2 r409, %74, %71;
}
{
mul.f16x2 r412, r409, r594;
}
{
add.f16x2 r415, %75, r412;
}
{
add.f16x2 r418, %77, %73;
}
{
mul.f16x2 r421, r418, r603;
}
{
add.f16x2 r424, r415, r421;
}
{
sub.f16x2 r427, %79, %76;
}
{
mul.f16x2 r430, r427, r612;
}
{
sub.f16x2 r433, %72, %78;
}
{
mul.f16x2 r436, r433, r618;
}
{
add.f16x2 r439, r430, r436;
}
{
sub.f16x2 r442, r424, r439;
}
{
add.f16x2 r445, %74, %71;
}
{
mul.f16x2 r448, r445, r594;
}
{
add.f16x2 r451, %75, r448;
}
{
add.f16x2 r454, %77, %73;
}
{
mul.f16x2 r457, r454, r603;
}
{
add.f16x2 r460, r451, r457;
}
{
sub.f16x2 r463, %79, %76;
}
{
mul.f16x2 r466, r463, r612;
}
{
sub.f16x2 r469, %72, %78;
}
{
mul.f16x2 r472, r469, r618;
}
{
add.f16x2 r475, r466, r472;
}
{
add.f16x2 r478, r460, r475;
}
{
add.f16x2 r481, %79, %76;
}
{
mul.f16x2 r484, r481, r522;
}
{
add.f16x2 r487, %70, r484;
}
{
add.f16x2 r490, %72, %78;
}
{
mul.f16x2 r493, r490, r594;
}
{
add.f16x2 r496, r487, r493;
}
{
sub.f16x2 r499, %74, %71;
}
{
mul.f16x2 r502, r499, r540;
}
{
sub.f16x2 r505, %77, %73;
}
{
mul.f16x2 r508, r505, r612;
}
{
add.f16x2 r511, r502, r508;
}
{
add.f16x2 r514, r496, r511;
}
{
add.f16x2 r517, %79, %76;
}
{
mul.f16x2 r520, r517, r522;
}
{
add.f16x2 r523, %70, r520;
}
{
add.f16x2 r526, %72, %78;
}
{
mul.f16x2 r529, r526, r594;
}
{
add.f16x2 r532, r523, r529;
}
{
sub.f16x2 r535, %74, %71;
}
{
mul.f16x2 r538, r535, r540;
}
{
sub.f16x2 r541, %77, %73;
}
{
mul.f16x2 r544, r541, r612;
}
{
add.f16x2 r547, r538, r544;
}
{
sub.f16x2 r550, r532, r547;
}
{
add.f16x2 r553, %79, %76;
}
{
mul.f16x2 r556, r553, r594;
}
{
add.f16x2 r559, %70, r556;
}
{
add.f16x2 r562, %72, %78;
}
{
mul.f16x2 r565, r562, r603;
}
{
add.f16x2 r568, r559, r565;
}
{
sub.f16x2 r571, %74, %71;
}
{
mul.f16x2 r574, r571, r612;
}
{
sub.f16x2 r577, %77, %73;
}
{
mul.f16x2 r580, r577, r618;
}
{
add.f16x2 r583, r574, r580;
}
{
add.f16x2 r586, r568, r583;
}
{
add.f16x2 r589, %79, %76;
}
{
mul.f16x2 r592, r589, r594;
}
{
add.f16x2 r595, %70, r592;
}
{
add.f16x2 r598, %72, %78;
}
{
mul.f16x2 r601, r598, r603;
}
{
add.f16x2 r604, r595, r601;
}
{
sub.f16x2 r607, %74, %71;
}
{
mul.f16x2 r610, r607, r612;
}
{
sub.f16x2 r613, %77, %73;
}
{
mul.f16x2 r616, r613, r618;
}
{
add.f16x2 r619, r610, r616;
}
{
sub.f16x2 r622, r604, r619;
}
{
cvt.rn.f16.f64 rs17, fd123;
}
mov.b32 r834, {rs17, rs17};
{
cvt.rn.f16.f64 rs18, fd130;
}
mov.b32 r852, {rs18, rs18};
{
cvt.rn.f16.f64 rs19, fd135;
}
mov.b32 r906, {rs19, rs19};
{
cvt.rn.f16.f64 rs20, fd136;
}
mov.b32 r924, {rs20, rs20};
{
cvt.rn.f16.f64 rs21, fd123;
}
mov.b32 r915, {rs21, rs21};
{
cvt.rn.f16.f64 rs22, fd130;
}
{
neg.f16 rs23, rs22;
}
mov.b32 r930, {rs23, rs23};
{
add.f16x2 r625, %81, %88;
}
{
add.f16x2 r628, %82, r625;
}
{
add.f16x2 r631, %84, %80;
}
{
add.f16x2 r634, r628, r631;
}
{
add.f16x2 r637, %86, %83;
}
{
add.f16x2 r640, %87, r637;
}
{
add.f16x2 r643, %89, %85;
}
{
add.f16x2 r646, r640, r643;
}
{
add.f16x2 r649, %81, %88;
}
{
mul.f16x2 r652, r649, r834;
}
{
add.f16x2 r655, %82, r652;
}
{
add.f16x2 r658, %84, %80;
}
{
mul.f16x2 r661, r658, r906;
}
{
add.f16x2 r664, r655, r661;
}
{
sub.f16x2 r667, %86, %83;
}
{
mul.f16x2 r670, r667, r852;
}
{
sub.f16x2 r673, %89, %85;
}
{
mul.f16x2 r676, r673, r924;
}
{
add.f16x2 r679, r670, r676;
}
{
sub.f16x2 r682, r664, r679;
}
{
add.f16x2 r685, %81, %88;
}
{
mul.f16x2 r688, r685, r834;
}
{
add.f16x2 r691, %82, r688;
}
{
add.f16x2 r694, %84, %80;
}
{
mul.f16x2 r697, r694, r906;
}
{
add.f16x2 r700, r691, r697;
}
{
sub.f16x2 r703, %86, %83;
}
{
mul.f16x2 r706, r703, r852;
}
{
sub.f16x2 r709, %89, %85;
}
{
mul.f16x2 r712, r709, r924;
}
{
add.f16x2 r715, r706, r712;
}
{
add.f16x2 r718, r700, r715;
}
{
add.f16x2 r721, %81, %88;
}
{
mul.f16x2 r724, r721, r906;
}
{
add.f16x2 r727, %82, r724;
}
{
add.f16x2 r730, %84, %80;
}
{
mul.f16x2 r733, r730, r915;
}
{
add.f16x2 r736, r727, r733;
}
{
sub.f16x2 r739, %86, %83;
}
{
mul.f16x2 r742, r739, r924;
}
{
sub.f16x2 r745, %89, %85;
}
{
mul.f16x2 r748, r745, r930;
}
{
add.f16x2 r751, r742, r748;
}
{
sub.f16x2 r754, r736, r751;
}
{
add.f16x2 r757, %81, %88;
}
{
mul.f16x2 r760, r757, r906;
}
{
add.f16x2 r763, %82, r760;
}
{
add.f16x2 r766, %84, %80;
}
{
mul.f16x2 r769, r766, r915;
}
{
add.f16x2 r772, r763, r769;
}
{
sub.f16x2 r775, %86, %83;
}
{
mul.f16x2 r778, r775, r924;
}
{
sub.f16x2 r781, %89, %85;
}
{
mul.f16x2 r784, r781, r930;
}
{
add.f16x2 r787, r778, r784;
}
{
add.f16x2 r790, r772, r787;
}
{
add.f16x2 r793, %86, %83;
}
{
mul.f16x2 r796, r793, r834;
}
{
add.f16x2 r799, %87, r796;
}
{
add.f16x2 r802, %89, %85;
}
{
mul.f16x2 r805, r802, r906;
}
{
add.f16x2 r808, r799, r805;
}
{
sub.f16x2 r811, %81, %88;
}
{
mul.f16x2 r814, r811, r852;
}
{
sub.f16x2 r817, %84, %80;
}
{
mul.f16x2 r820, r817, r924;
}
{
add.f16x2 r823, r814, r820;
}
{
add.f16x2 r826, r808, r823;
}
{
add.f16x2 r829, %86, %83;
}
{
mul.f16x2 r832, r829, r834;
}
{
add.f16x2 r835, %87, r832;
}
{
add.f16x2 r838, %89, %85;
}
{
mul.f16x2 r841, r838, r906;
}
{
add.f16x2 r844, r835, r841;
}
{
sub.f16x2 r847, %81, %88;
}
{
mul.f16x2 r850, r847, r852;
}
{
sub.f16x2 r853, %84, %80;
}
{
mul.f16x2 r856, r853, r924;
}
{
add.f16x2 r859, r850, r856;
}
{
sub.f16x2 r862, r844, r859;
}
{
add.f16x2 r865, %86, %83;
}
{
mul.f16x2 r868, r865, r906;
}
{
add.f16x2 r871, %87, r868;
}
{
add.f16x2 r874, %89, %85;
}
{
mul.f16x2 r877, r874, r915;
}
{
add.f16x2 r880, r871, r877;
}
{
sub.f16x2 r883, %81, %88;
}
{
mul.f16x2 r886, r883, r924;
}
{
sub.f16x2 r889, %84, %80;
}
{
mul.f16x2 r892, r889, r930;
}
{
add.f16x2 r895, r886, r892;
}
{
add.f16x2 r898, r880, r895;
}
{
add.f16x2 r901, %86, %83;
}
{
mul.f16x2 r904, r901, r906;
}
{
add.f16x2 r907, %87, r904;
}
{
add.f16x2 r910, %89, %85;
}
{
mul.f16x2 r913, r910, r915;
}
{
add.f16x2 r916, r907, r913;
}
{
sub.f16x2 r919, %81, %88;
}
{
mul.f16x2 r922, r919, r924;
}
{
sub.f16x2 r925, %84, %80;
}
{
mul.f16x2 r928, r925, r930;
}
{
add.f16x2 r931, r922, r928;
}
{
sub.f16x2 r934, r916, r931;
}
mov.f64 fd115, 0d3FED3BC3AEFF7F95;
{
cvt.rn.f16.f64 rs25, fd115;
}
mov.f64 fd138, 0dBFDA07F921061AD1;
{
cvt.rn.f16.f64 rs26, fd138;
}
mov.f64 fd119, 0d3FE5698496E20BD8;
{
cvt.rn.f16.f64 rs27, fd119;
}
mov.f64 fd134, 0dBFE7C7D7A833BEC2;
{
cvt.rn.f16.f64 rs28, fd134;
}
{
cvt.rn.f16.f64 rs29, fd123;
}
{
cvt.rn.f16.f64 rs30, fd130;
}
mov.f64 fd127, 0dBFBAC2609B3C576C;
{
cvt.rn.f16.f64 rs31, fd127;
}
mov.f64 fd128, 0dBFEFD31F94F867C6;
{
cvt.rn.f16.f64 rs32, fd128;
}
{
cvt.rn.f16.f64 rs35, fd135;
}
{
cvt.rn.f16.f64 rs36, fd136;
}
mov.f64 fd139, 0dBFEF4CFC327A0080;
{
cvt.rn.f16.f64 rs39, fd139;
}
mov.f64 fd90, 0d3FCA9CD9AC4258F6;
{
cvt.rn.f16.f64 rs40, fd90;
}
mov.b32 r951, {rs25, rs25};
{
mul.f16x2 r937, r370, r951;
}
mov.b32 r948, {rs26, rs26};
{
mul.f16x2 r940, r514, r948;
}
{
sub.f16x2 r943, r937, r940;
}
{
mul.f16x2 r946, r370, r948;
}
{
fma.rn.f16x2 r949, r514, r951, r946;
}
mov.b32 r983, {rs27, rs27};
{
mul.f16x2 r953, r682, r983;
}
mov.b32 r980, {rs28, rs28};
{
mul.f16x2 r956, r826, r980;
}
{
sub.f16x2 r959, r953, r956;
}
{
mul.f16x2 r962, r682, r980;
}
{
fma.rn.f16x2 r965, r826, r983, r962;
}
{
mul.f16x2 r969, r442, r983;
}
{
mul.f16x2 r972, r586, r980;
}
{
sub.f16x2 r975, r969, r972;
}
{
mul.f16x2 r978, r442, r980;
}
{
fma.rn.f16x2 r981, r586, r983, r978;
}
mov.b32 r1047, {rs31, rs31};
{
mul.f16x2 r985, r754, r1047;
}
mov.b32 r1044, {rs32, rs32};
{
mul.f16x2 r988, r898, r1044;
}
{
sub.f16x2 r991, r985, r988;
}
{
mul.f16x2 r994, r754, r1044;
}
{
fma.rn.f16x2 r997, r898, r1047, r994;
}
mov.b32 r1015, {rs29, rs29};
{
mul.f16x2 r1001, r478, r1015;
}
mov.b32 r1012, {rs30, rs30};
{
mul.f16x2 r1004, r622, r1012;
}
{
sub.f16x2 r1007, r1001, r1004;
}
{
mul.f16x2 r1010, r478, r1012;
}
{
fma.rn.f16x2 r1013, r622, r1015, r1010;
}
mov.b32 r1031, {rs35, rs35};
{
mul.f16x2 r1017, r790, r1031;
}
mov.b32 r1028, {rs36, rs36};
{
mul.f16x2 r1020, r934, r1028;
}
{
sub.f16x2 r1023, r1017, r1020;
}
{
mul.f16x2 r1026, r790, r1028;
}
{
fma.rn.f16x2 r1029, r934, r1031, r1026;
}
{
mul.f16x2 r1033, r406, r1047;
}
{
mul.f16x2 r1036, r550, r1044;
}
{
sub.f16x2 r1039, r1033, r1036;
}
{
mul.f16x2 r1042, r406, r1044;
}
{
fma.rn.f16x2 r1045, r550, r1047, r1042;
}
mov.b32 r1063, {rs39, rs39};
{
mul.f16x2 r1049, r718, r1063;
}
mov.b32 r1060, {rs40, rs40};
mov.f64 fd173, 0dBFE0000000000000;
{
mul.f16x2 r1052, r862, r1060;
}
{
sub.f16x2 r1055, r1049, r1052;
}
{
mul.f16x2 r1058, r718, r1060;
}
{
fma.rn.f16x2 r1061, r862, r1063, r1058;
}
{
cvt.rn.f16.f64 rs53, fd173;
}
mov.b32 r1136, {rs53, rs53};
mov.f64 fd172, 0dBFEBB67AE8584CAA;
{
cvt.rn.f16.f64 rs54, fd172;
}
{
neg.f16 rs55, rs54;
}
mov.b32 r1145, {rs55, rs55};
{
add.f16x2 r1065, r322, r634;
}
{
add.f16x2 r1068, r10, r1065;
}
{
add.f16x2 r1071, r334, r646;
}
{
add.f16x2 r1074, r22, r1071;
}
{
add.f16x2 r1077, r322, r634;
}
{
mul.f16x2 r1080, r1077, r1136;
}
{
add.f16x2 r1083, r10, r1080;
}
{
sub.f16x2 r1086, r334, r646;
}
{
mul.f16x2 r1089, r1086, r1145;
}
{
add.f16x2 r1092, r1083, r1089;
}
{
add.f16x2 r1095, r322, r634;
}
{
mul.f16x2 r1098, r1095, r1136;
}
{
add.f16x2 r1101, r10, r1098;
}
{
sub.f16x2 r1104, r334, r646;
}
{
mul.f16x2 r1107, r1104, r1145;
}
{
sub.f16x2 r1110, r1101, r1107;
}
{
add.f16x2 r1113, r334, r646;
}
{
mul.f16x2 r1116, r1113, r1136;
}
{
add.f16x2 r1119, r22, r1116;
}
{
sub.f16x2 r1122, r322, r634;
}
{
mul.f16x2 r1125, r1122, r1145;
}
{
sub.f16x2 r1128, r1119, r1125;
}
{
add.f16x2 r1131, r334, r646;
}
{
mul.f16x2 r1134, r1131, r1136;
}
{
add.f16x2 r1137, r22, r1134;
}
{
sub.f16x2 r1140, r322, r634;
}
{
mul.f16x2 r1143, r1140, r1145;
}
{
add.f16x2 r1146, r1137, r1143;
}
{
cvt.rn.f16.f64 rs57, fd173;
}
mov.b32 r1220, {rs57, rs57};
{
cvt.rn.f16.f64 rs58, fd172;
}
{
neg.f16 rs59, rs58;
}
mov.b32 r1229, {rs59, rs59};
{
add.f16x2 r1149, r943, r959;
}
{
add.f16x2 r1152, r58, r1149;
}
{
add.f16x2 r1155, r949, r965;
}
{
add.f16x2 r1158, r202, r1155;
}
{
add.f16x2 r1161, r943, r959;
}
{
mul.f16x2 r1164, r1161, r1220;
}
{
add.f16x2 r1167, r58, r1164;
}
{
sub.f16x2 r1170, r949, r965;
}
{
mul.f16x2 r1173, r1170, r1229;
}
{
add.f16x2 r1176, r1167, r1173;
}
{
add.f16x2 r1179, r943, r959;
}
{
mul.f16x2 r1182, r1179, r1220;
}
{
add.f16x2 r1185, r58, r1182;
}
{
sub.f16x2 r1188, r949, r965;
}
{
mul.f16x2 r1191, r1188, r1229;
}
{
sub.f16x2 r1194, r1185, r1191;
}
{
add.f16x2 r1197, r949, r965;
}
{
mul.f16x2 r1200, r1197, r1220;
}
{
add.f16x2 r1203, r202, r1200;
}
{
sub.f16x2 r1206, r943, r959;
}
{
mul.f16x2 r1209, r1206, r1229;
}
{
sub.f16x2 r1212, r1203, r1209;
}
{
add.f16x2 r1215, r949, r965;
}
{
mul.f16x2 r1218, r1215, r1220;
}
{
add.f16x2 r1221, r202, r1218;
}
{
sub.f16x2 r1224, r943, r959;
}
{
mul.f16x2 r1227, r1224, r1229;
}
{
add.f16x2 r1230, r1221, r1227;
}
{
cvt.rn.f16.f64 rs61, fd173;
}
mov.b32 r1304, {rs61, rs61};
{
cvt.rn.f16.f64 rs62, fd172;
}
{
neg.f16 rs63, rs62;
}
mov.b32 r1313, {rs63, rs63};
{
add.f16x2 r1233, r975, r991;
}
{
add.f16x2 r1236, r130, r1233;
}
{
add.f16x2 r1239, r981, r997;
}
{
add.f16x2 r1242, r274, r1239;
}
{
add.f16x2 r1245, r975, r991;
}
{
mul.f16x2 r1248, r1245, r1304;
}
{
add.f16x2 r1251, r130, r1248;
}
{
sub.f16x2 r1254, r981, r997;
}
{
mul.f16x2 r1257, r1254, r1313;
}
{
add.f16x2 r1260, r1251, r1257;
}
{
add.f16x2 r1263, r975, r991;
}
{
mul.f16x2 r1266, r1263, r1304;
}
{
add.f16x2 r1269, r130, r1266;
}
{
sub.f16x2 r1272, r981, r997;
}
{
mul.f16x2 r1275, r1272, r1313;
}
{
sub.f16x2 r1278, r1269, r1275;
}
{
add.f16x2 r1281, r981, r997;
}
{
mul.f16x2 r1284, r1281, r1304;
}
{
add.f16x2 r1287, r274, r1284;
}
{
sub.f16x2 r1290, r975, r991;
}
{
mul.f16x2 r1293, r1290, r1313;
}
{
sub.f16x2 r1296, r1287, r1293;
}
{
add.f16x2 r1299, r981, r997;
}
{
mul.f16x2 r1302, r1299, r1304;
}
{
add.f16x2 r1305, r274, r1302;
}
{
sub.f16x2 r1308, r975, r991;
}
{
mul.f16x2 r1311, r1308, r1313;
}
{
add.f16x2 r1314, r1305, r1311;
}
{
cvt.rn.f16.f64 rs65, fd173;
}
mov.b32 r1388, {rs65, rs65};
{
cvt.rn.f16.f64 rs66, fd172;
}
{
neg.f16 rs67, rs66;
}
mov.b32 r1397, {rs67, rs67};
{
add.f16x2 r1317, r1007, r1023;
}
{
add.f16x2 r1320, r166, r1317;
}
{
add.f16x2 r1323, r1013, r1029;
}
{
add.f16x2 r1326, r310, r1323;
}
{
add.f16x2 r1329, r1007, r1023;
}
{
mul.f16x2 r1332, r1329, r1388;
}
{
add.f16x2 r1335, r166, r1332;
}
{
sub.f16x2 r1338, r1013, r1029;
}
{
mul.f16x2 r1341, r1338, r1397;
}
{
add.f16x2 r1344, r1335, r1341;
}
{
add.f16x2 r1347, r1007, r1023;
}
{
mul.f16x2 r1350, r1347, r1388;
}
{
add.f16x2 r1353, r166, r1350;
}
{
sub.f16x2 r1356, r1013, r1029;
}
{
mul.f16x2 r1359, r1356, r1397;
}
{
sub.f16x2 r1362, r1353, r1359;
}
{
add.f16x2 r1365, r1013, r1029;
}
{
mul.f16x2 r1368, r1365, r1388;
}
{
add.f16x2 r1371, r310, r1368;
}
{
sub.f16x2 r1374, r1007, r1023;
}
{
mul.f16x2 r1377, r1374, r1397;
}
{
sub.f16x2 r1380, r1371, r1377;
}
{
add.f16x2 r1383, r1013, r1029;
}
{
mul.f16x2 r1386, r1383, r1388;
}
{
add.f16x2 r1389, r310, r1386;
}
{
sub.f16x2 r1392, r1007, r1023;
}
{
mul.f16x2 r1395, r1392, r1397;
}
{
add.f16x2 r1398, r1389, r1395;
}
{
cvt.rn.f16.f64 rs69, fd173;
}
mov.b32 r1472, {rs69, rs69};
{
cvt.rn.f16.f64 rs70, fd172;
}
{
neg.f16 rs71, rs70;
}
mov.b32 r1481, {rs71, rs71};
{
add.f16x2 r1401, r1039, r1055;
}
{
add.f16x2 r1404, r94, r1401;
}
{
add.f16x2 r1407, r1045, r1061;
}
{
add.f16x2 r1410, r238, r1407;
}
{
add.f16x2 r1413, r1039, r1055;
}
{
mul.f16x2 r1416, r1413, r1472;
}
{
add.f16x2 r1419, r94, r1416;
}
{
sub.f16x2 r1422, r1045, r1061;
}
{
mul.f16x2 r1425, r1422, r1481;
}
{
add.f16x2 r1428, r1419, r1425;
}
{
add.f16x2 r1431, r1039, r1055;
}
{
mul.f16x2 r1434, r1431, r1472;
}
{
add.f16x2 r1437, r94, r1434;
}
{
sub.f16x2 r1440, r1045, r1061;
}
{
mul.f16x2 r1443, r1440, r1481;
}
{
sub.f16x2 r1446, r1437, r1443;
}
{
add.f16x2 r1449, r1045, r1061;
}
{
mul.f16x2 r1452, r1449, r1472;
}
{
add.f16x2 r1455, r238, r1452;
}
{
sub.f16x2 r1458, r1039, r1055;
}
{
mul.f16x2 r1461, r1458, r1481;
}
{
sub.f16x2 r1464, r1455, r1461;
}
{
add.f16x2 r1467, r1045, r1061;
}
{
mul.f16x2 r1470, r1467, r1472;
}
{
add.f16x2 r1473, r238, r1470;
}
{
sub.f16x2 r1476, r1039, r1055;
}
{
mul.f16x2 r1479, r1476, r1481;
}
{
add.f16x2 r1482, r1473, r1479;
}
{
cvt.rn.f16.f64 rs73, fd123;
}
mov.b32 r1694, {rs73, rs73};
{
cvt.rn.f16.f64 rs74, fd130;
}
mov.b32 r1712, {rs74, rs74};
{
cvt.rn.f16.f64 rs75, fd135;
}
mov.b32 r1766, {rs75, rs75};
{
cvt.rn.f16.f64 rs76, fd136;
}
mov.b32 r1784, {rs76, rs76};
{
cvt.rn.f16.f64 rs77, fd123;
}
mov.b32 r1775, {rs77, rs77};
{
cvt.rn.f16.f64 rs78, fd130;
}
{
neg.f16 rs79, rs78;
}
mov.b32 r1790, {rs79, rs79};
{
add.f16x2 r1485, %96, %93;
}
{
add.f16x2 r1488, %97, r1485;
}
{
add.f16x2 r1491, %99, %95;
}
{
add.f16x2 r1494, r1488, r1491;
}
{
add.f16x2 r1497, %91, %98;
}
{
add.f16x2 r1500, %92, r1497;
}
{
add.f16x2 r1503, %94, %90;
}
{
add.f16x2 r1506, r1500, r1503;
}
{
add.f16x2 r1509, %96, %93;
}
{
mul.f16x2 r1512, r1509, r1694;
}
{
add.f16x2 r1515, %97, r1512;
}
{
add.f16x2 r1518, %99, %95;
}
{
mul.f16x2 r1521, r1518, r1766;
}
{
add.f16x2 r1524, r1515, r1521;
}
{
sub.f16x2 r1527, %91, %98;
}
{
mul.f16x2 r1530, r1527, r1712;
}
{
sub.f16x2 r1533, %94, %90;
}
{
mul.f16x2 r1536, r1533, r1784;
}
{
add.f16x2 r1539, r1530, r1536;
}
{
sub.f16x2 r1542, r1524, r1539;
}
{
add.f16x2 r1545, %96, %93;
}
{
mul.f16x2 r1548, r1545, r1694;
}
{
add.f16x2 r1551, %97, r1548;
}
{
add.f16x2 r1554, %99, %95;
}
{
mul.f16x2 r1557, r1554, r1766;
}
{
add.f16x2 r1560, r1551, r1557;
}
{
sub.f16x2 r1563, %91, %98;
}
{
mul.f16x2 r1566, r1563, r1712;
}
{
sub.f16x2 r1569, %94, %90;
}
{
mul.f16x2 r1572, r1569, r1784;
}
{
add.f16x2 r1575, r1566, r1572;
}
{
add.f16x2 r1578, r1560, r1575;
}
{
add.f16x2 r1581, %96, %93;
}
{
mul.f16x2 r1584, r1581, r1766;
}
{
add.f16x2 r1587, %97, r1584;
}
{
add.f16x2 r1590, %99, %95;
}
{
mul.f16x2 r1593, r1590, r1775;
}
{
add.f16x2 r1596, r1587, r1593;
}
{
sub.f16x2 r1599, %91, %98;
}
{
mul.f16x2 r1602, r1599, r1784;
}
{
sub.f16x2 r1605, %94, %90;
}
{
mul.f16x2 r1608, r1605, r1790;
}
{
add.f16x2 r1611, r1602, r1608;
}
{
sub.f16x2 r1614, r1596, r1611;
}
{
add.f16x2 r1617, %96, %93;
}
{
mul.f16x2 r1620, r1617, r1766;
}
{
add.f16x2 r1623, %97, r1620;
}
{
add.f16x2 r1626, %99, %95;
}
{
mul.f16x2 r1629, r1626, r1775;
}
{
add.f16x2 r1632, r1623, r1629;
}
{
sub.f16x2 r1635, %91, %98;
}
{
mul.f16x2 r1638, r1635, r1784;
}
{
sub.f16x2 r1641, %94, %90;
}
{
mul.f16x2 r1644, r1641, r1790;
}
{
add.f16x2 r1647, r1638, r1644;
}
{
add.f16x2 r1650, r1632, r1647;
}
{
add.f16x2 r1653, %91, %98;
}
{
mul.f16x2 r1656, r1653, r1694;
}
{
add.f16x2 r1659, %92, r1656;
}
{
add.f16x2 r1662, %94, %90;
}
{
mul.f16x2 r1665, r1662, r1766;
}
{
add.f16x2 r1668, r1659, r1665;
}
{
sub.f16x2 r1671, %96, %93;
}
{
mul.f16x2 r1674, r1671, r1712;
}
{
sub.f16x2 r1677, %99, %95;
}
{
mul.f16x2 r1680, r1677, r1784;
}
{
add.f16x2 r1683, r1674, r1680;
}
{
add.f16x2 r1686, r1668, r1683;
}
{
add.f16x2 r1689, %91, %98;
}
{
mul.f16x2 r1692, r1689, r1694;
}
{
add.f16x2 r1695, %92, r1692;
}
{
add.f16x2 r1698, %94, %90;
}
{
mul.f16x2 r1701, r1698, r1766;
}
{
add.f16x2 r1704, r1695, r1701;
}
{
sub.f16x2 r1707, %96, %93;
}
{
mul.f16x2 r1710, r1707, r1712;
}
{
sub.f16x2 r1713, %99, %95;
}
{
mul.f16x2 r1716, r1713, r1784;
}
{
add.f16x2 r1719, r1710, r1716;
}
{
sub.f16x2 r1722, r1704, r1719;
}
{
add.f16x2 r1725, %91, %98;
}
{
mul.f16x2 r1728, r1725, r1766;
}
{
add.f16x2 r1731, %92, r1728;
}
{
add.f16x2 r1734, %94, %90;
}
{
mul.f16x2 r1737, r1734, r1775;
}
{
add.f16x2 r1740, r1731, r1737;
}
{
sub.f16x2 r1743, %96, %93;
}
{
mul.f16x2 r1746, r1743, r1784;
}
{
sub.f16x2 r1749, %99, %95;
}
{
mul.f16x2 r1752, r1749, r1790;
}
{
add.f16x2 r1755, r1746, r1752;
}
{
add.f16x2 r1758, r1740, r1755;
}
{
add.f16x2 r1761, %91, %98;
}
{
mul.f16x2 r1764, r1761, r1766;
}
{
add.f16x2 r1767, %92, r1764;
}
{
add.f16x2 r1770, %94, %90;
}
{
mul.f16x2 r1773, r1770, r1775;
}
{
add.f16x2 r1776, r1767, r1773;
}
{
sub.f16x2 r1779, %96, %93;
}
{
mul.f16x2 r1782, r1779, r1784;
}
{
sub.f16x2 r1785, %99, %95;
}
{
mul.f16x2 r1788, r1785, r1790;
}
{
add.f16x2 r1791, r1782, r1788;
}
{
sub.f16x2 r1794, r1776, r1791;
}
{
cvt.rn.f16.f64 rs81, fd123;
}
mov.b32 r2006, {rs81, rs81};
{
cvt.rn.f16.f64 rs82, fd130;
}
mov.b32 r2024, {rs82, rs82};
{
cvt.rn.f16.f64 rs83, fd135;
}
mov.b32 r2078, {rs83, rs83};
{
cvt.rn.f16.f64 rs84, fd136;
}
mov.b32 r2096, {rs84, rs84};
{
cvt.rn.f16.f64 rs85, fd123;
}
mov.b32 r2087, {rs85, rs85};
{
cvt.rn.f16.f64 rs86, fd130;
}
{
neg.f16 rs87, rs86;
}
mov.b32 r2102, {rs87, rs87};
{
add.f16x2 r1797, %103, %101;
}
{
add.f16x2 r1800, %105, r1797;
}
{
add.f16x2 r1803, %107, %104;
}
{
add.f16x2 r1806, r1800, r1803;
}
{
add.f16x2 r1809, %109, %106;
}
{
add.f16x2 r1812, %100, r1809;
}
{
add.f16x2 r1815, %102, %108;
}
{
add.f16x2 r1818, r1812, r1815;
}
{
add.f16x2 r1821, %103, %101;
}
{
mul.f16x2 r1824, r1821, r2006;
}
{
add.f16x2 r1827, %105, r1824;
}
{
add.f16x2 r1830, %107, %104;
}
{
mul.f16x2 r1833, r1830, r2078;
}
{
add.f16x2 r1836, r1827, r1833;
}
{
sub.f16x2 r1839, %109, %106;
}
{
mul.f16x2 r1842, r1839, r2024;
}
{
sub.f16x2 r1845, %102, %108;
}
{
mul.f16x2 r1848, r1845, r2096;
}
{
add.f16x2 r1851, r1842, r1848;
}
{
sub.f16x2 r1854, r1836, r1851;
}
{
add.f16x2 r1857, %103, %101;
}
{
mul.f16x2 r1860, r1857, r2006;
}
{
add.f16x2 r1863, %105, r1860;
}
{
add.f16x2 r1866, %107, %104;
}
{
mul.f16x2 r1869, r1866, r2078;
}
{
add.f16x2 r1872, r1863, r1869;
}
{
sub.f16x2 r1875, %109, %106;
}
{
mul.f16x2 r1878, r1875, r2024;
}
{
sub.f16x2 r1881, %102, %108;
}
{
mul.f16x2 r1884, r1881, r2096;
}
{
add.f16x2 r1887, r1878, r1884;
}
{
add.f16x2 r1890, r1872, r1887;
}
{
add.f16x2 r1893, %103, %101;
}
{
mul.f16x2 r1896, r1893, r2078;
}
{
add.f16x2 r1899, %105, r1896;
}
{
add.f16x2 r1902, %107, %104;
}
{
mul.f16x2 r1905, r1902, r2087;
}
{
add.f16x2 r1908, r1899, r1905;
}
{
sub.f16x2 r1911, %109, %106;
}
{
mul.f16x2 r1914, r1911, r2096;
}
{
sub.f16x2 r1917, %102, %108;
}
{
mul.f16x2 r1920, r1917, r2102;
}
{
add.f16x2 r1923, r1914, r1920;
}
{
sub.f16x2 r1926, r1908, r1923;
}
{
add.f16x2 r1929, %103, %101;
}
{
mul.f16x2 r1932, r1929, r2078;
}
{
add.f16x2 r1935, %105, r1932;
}
{
add.f16x2 r1938, %107, %104;
}
{
mul.f16x2 r1941, r1938, r2087;
}
{
add.f16x2 r1944, r1935, r1941;
}
{
sub.f16x2 r1947, %109, %106;
}
{
mul.f16x2 r1950, r1947, r2096;
}
{
sub.f16x2 r1953, %102, %108;
}
{
mul.f16x2 r1956, r1953, r2102;
}
{
add.f16x2 r1959, r1950, r1956;
}
{
add.f16x2 r1962, r1944, r1959;
}
{
add.f16x2 r1965, %109, %106;
}
{
mul.f16x2 r1968, r1965, r2006;
}
{
add.f16x2 r1971, %100, r1968;
}
{
add.f16x2 r1974, %102, %108;
}
{
mul.f16x2 r1977, r1974, r2078;
}
{
add.f16x2 r1980, r1971, r1977;
}
{
sub.f16x2 r1983, %103, %101;
}
{
mul.f16x2 r1986, r1983, r2024;
}
{
sub.f16x2 r1989, %107, %104;
}
{
mul.f16x2 r1992, r1989, r2096;
}
{
add.f16x2 r1995, r1986, r1992;
}
{
add.f16x2 r1998, r1980, r1995;
}
{
add.f16x2 r2001, %109, %106;
}
{
mul.f16x2 r2004, r2001, r2006;
}
{
add.f16x2 r2007, %100, r2004;
}
{
add.f16x2 r2010, %102, %108;
}
{
mul.f16x2 r2013, r2010, r2078;
}
{
add.f16x2 r2016, r2007, r2013;
}
{
sub.f16x2 r2019, %103, %101;
}
{
mul.f16x2 r2022, r2019, r2024;
}
{
sub.f16x2 r2025, %107, %104;
}
{
mul.f16x2 r2028, r2025, r2096;
}
{
add.f16x2 r2031, r2022, r2028;
}
{
sub.f16x2 r2034, r2016, r2031;
}
{
add.f16x2 r2037, %109, %106;
}
{
mul.f16x2 r2040, r2037, r2078;
}
{
add.f16x2 r2043, %100, r2040;
}
{
add.f16x2 r2046, %102, %108;
}
{
mul.f16x2 r2049, r2046, r2087;
}
{
add.f16x2 r2052, r2043, r2049;
}
{
sub.f16x2 r2055, %103, %101;
}
{
mul.f16x2 r2058, r2055, r2096;
}
{
sub.f16x2 r2061, %107, %104;
}
{
mul.f16x2 r2064, r2061, r2102;
}
{
add.f16x2 r2067, r2058, r2064;
}
{
add.f16x2 r2070, r2052, r2067;
}
{
add.f16x2 r2073, %109, %106;
}
{
mul.f16x2 r2076, r2073, r2078;
}
{
add.f16x2 r2079, %100, r2076;
}
{
add.f16x2 r2082, %102, %108;
}
{
mul.f16x2 r2085, r2082, r2087;
}
{
add.f16x2 r2088, r2079, r2085;
}
{
sub.f16x2 r2091, %103, %101;
}
{
mul.f16x2 r2094, r2091, r2096;
}
{
sub.f16x2 r2097, %107, %104;
}
{
mul.f16x2 r2100, r2097, r2102;
}
{
add.f16x2 r2103, r2094, r2100;
}
{
sub.f16x2 r2106, r2088, r2103;
}
{
cvt.rn.f16.f64 rs89, fd123;
}
mov.b32 r2318, {rs89, rs89};
{
cvt.rn.f16.f64 rs90, fd130;
}
mov.b32 r2336, {rs90, rs90};
{
cvt.rn.f16.f64 rs91, fd135;
}
mov.b32 r2390, {rs91, rs91};
{
cvt.rn.f16.f64 rs92, fd136;
}
mov.b32 r2408, {rs92, rs92};
{
cvt.rn.f16.f64 rs93, fd123;
}
mov.b32 r2399, {rs93, rs93};
{
cvt.rn.f16.f64 rs94, fd130;
}
{
neg.f16 rs95, rs94;
}
mov.b32 r2414, {rs95, rs95};
{
add.f16x2 r2109, %113, %119;
}
{
add.f16x2 r2112, %111, r2109;
}
{
add.f16x2 r2115, %114, %112;
}
{
add.f16x2 r2118, r2112, r2115;
}
{
add.f16x2 r2121, %116, %115;
}
{
add.f16x2 r2124, %118, r2121;
}
{
add.f16x2 r2127, %110, %117;
}
{
add.f16x2 r2130, r2124, r2127;
}
{
add.f16x2 r2133, %113, %119;
}
{
mul.f16x2 r2136, r2133, r2318;
}
{
add.f16x2 r2139, %111, r2136;
}
{
add.f16x2 r2142, %114, %112;
}
{
mul.f16x2 r2145, r2142, r2390;
}
{
add.f16x2 r2148, r2139, r2145;
}
{
sub.f16x2 r2151, %116, %115;
}
{
mul.f16x2 r2154, r2151, r2336;
}
{
sub.f16x2 r2157, %110, %117;
}
{
mul.f16x2 r2160, r2157, r2408;
}
{
add.f16x2 r2163, r2154, r2160;
}
{
sub.f16x2 r2166, r2148, r2163;
}
{
add.f16x2 r2169, %113, %119;
}
{
mul.f16x2 r2172, r2169, r2318;
}
{
add.f16x2 r2175, %111, r2172;
}
{
add.f16x2 r2178, %114, %112;
}
{
mul.f16x2 r2181, r2178, r2390;
}
{
add.f16x2 r2184, r2175, r2181;
}
{
sub.f16x2 r2187, %116, %115;
}
{
mul.f16x2 r2190, r2187, r2336;
}
{
sub.f16x2 r2193, %110, %117;
}
{
mul.f16x2 r2196, r2193, r2408;
}
{
add.f16x2 r2199, r2190, r2196;
}
{
add.f16x2 r2202, r2184, r2199;
}
{
add.f16x2 r2205, %113, %119;
}
{
mul.f16x2 r2208, r2205, r2390;
}
{
add.f16x2 r2211, %111, r2208;
}
{
add.f16x2 r2214, %114, %112;
}
{
mul.f16x2 r2217, r2214, r2399;
}
{
add.f16x2 r2220, r2211, r2217;
}
{
sub.f16x2 r2223, %116, %115;
}
{
mul.f16x2 r2226, r2223, r2408;
}
{
sub.f16x2 r2229, %110, %117;
}
{
mul.f16x2 r2232, r2229, r2414;
}
{
add.f16x2 r2235, r2226, r2232;
}
{
sub.f16x2 r2238, r2220, r2235;
}
{
add.f16x2 r2241, %113, %119;
}
{
mul.f16x2 r2244, r2241, r2390;
}
{
add.f16x2 r2247, %111, r2244;
}
{
add.f16x2 r2250, %114, %112;
}
{
mul.f16x2 r2253, r2250, r2399;
}
{
add.f16x2 r2256, r2247, r2253;
}
{
sub.f16x2 r2259, %116, %115;
}
{
mul.f16x2 r2262, r2259, r2408;
}
{
sub.f16x2 r2265, %110, %117;
}
{
mul.f16x2 r2268, r2265, r2414;
}
{
add.f16x2 r2271, r2262, r2268;
}
{
add.f16x2 r2274, r2256, r2271;
}
{
add.f16x2 r2277, %116, %115;
}
{
mul.f16x2 r2280, r2277, r2318;
}
{
add.f16x2 r2283, %118, r2280;
}
{
add.f16x2 r2286, %110, %117;
}
{
mul.f16x2 r2289, r2286, r2390;
}
{
add.f16x2 r2292, r2283, r2289;
}
{
sub.f16x2 r2295, %113, %119;
}
{
mul.f16x2 r2298, r2295, r2336;
}
{
sub.f16x2 r2301, %114, %112;
}
{
mul.f16x2 r2304, r2301, r2408;
}
{
add.f16x2 r2307, r2298, r2304;
}
{
add.f16x2 r2310, r2292, r2307;
}
{
add.f16x2 r2313, %116, %115;
}
{
mul.f16x2 r2316, r2313, r2318;
}
{
add.f16x2 r2319, %118, r2316;
}
{
add.f16x2 r2322, %110, %117;
}
{
mul.f16x2 r2325, r2322, r2390;
}
{
add.f16x2 r2328, r2319, r2325;
}
{
sub.f16x2 r2331, %113, %119;
}
{
mul.f16x2 r2334, r2331, r2336;
}
{
sub.f16x2 r2337, %114, %112;
}
{
mul.f16x2 r2340, r2337, r2408;
}
{
add.f16x2 r2343, r2334, r2340;
}
{
sub.f16x2 r2346, r2328, r2343;
}
{
add.f16x2 r2349, %116, %115;
}
{
mul.f16x2 r2352, r2349, r2390;
}
{
add.f16x2 r2355, %118, r2352;
}
{
add.f16x2 r2358, %110, %117;
}
{
mul.f16x2 r2361, r2358, r2399;
}
{
add.f16x2 r2364, r2355, r2361;
}
{
sub.f16x2 r2367, %113, %119;
}
{
mul.f16x2 r2370, r2367, r2408;
}
{
sub.f16x2 r2373, %114, %112;
}
{
mul.f16x2 r2376, r2373, r2414;
}
{
add.f16x2 r2379, r2370, r2376;
}
{
add.f16x2 r2382, r2364, r2379;
}
{
add.f16x2 r2385, %116, %115;
}
{
mul.f16x2 r2388, r2385, r2390;
}
{
add.f16x2 r2391, %118, r2388;
}
{
add.f16x2 r2394, %110, %117;
}
{
mul.f16x2 r2397, r2394, r2399;
}
{
add.f16x2 r2400, r2391, r2397;
}
{
sub.f16x2 r2403, %113, %119;
}
{
mul.f16x2 r2406, r2403, r2408;
}
{
sub.f16x2 r2409, %114, %112;
}
{
mul.f16x2 r2412, r2409, r2414;
}
{
add.f16x2 r2415, r2406, r2412;
}
{
sub.f16x2 r2418, r2400, r2415;
}
{
cvt.rn.f16.f64 rs97, fd115;
}
{
cvt.rn.f16.f64 rs98, fd138;
}
{
cvt.rn.f16.f64 rs99, fd119;
}
{
cvt.rn.f16.f64 rs100, fd134;
}
{
cvt.rn.f16.f64 rs101, fd123;
}
{
cvt.rn.f16.f64 rs102, fd130;
}
{
cvt.rn.f16.f64 rs103, fd127;
}
{
cvt.rn.f16.f64 rs104, fd128;
}
{
cvt.rn.f16.f64 rs107, fd135;
}
{
cvt.rn.f16.f64 rs108, fd136;
}
{
cvt.rn.f16.f64 rs111, fd139;
}
{
cvt.rn.f16.f64 rs112, fd90;
}
mov.b32 r2435, {rs97, rs97};
{
mul.f16x2 r2421, r1854, r2435;
}
mov.b32 r2432, {rs98, rs98};
{
mul.f16x2 r2424, r1998, r2432;
}
{
sub.f16x2 r2427, r2421, r2424;
}
{
mul.f16x2 r2430, r1854, r2432;
}
{
fma.rn.f16x2 r2433, r1998, r2435, r2430;
}
mov.b32 r2467, {rs99, rs99};
{
mul.f16x2 r2437, r2166, r2467;
}
mov.b32 r2464, {rs100, rs100};
{
mul.f16x2 r2440, r2310, r2464;
}
{
sub.f16x2 r2443, r2437, r2440;
}
{
mul.f16x2 r2446, r2166, r2464;
}
{
fma.rn.f16x2 r2449, r2310, r2467, r2446;
}
{
mul.f16x2 r2453, r1926, r2467;
}
{
mul.f16x2 r2456, r2070, r2464;
}
{
sub.f16x2 r2459, r2453, r2456;
}
{
mul.f16x2 r2462, r1926, r2464;
}
{
fma.rn.f16x2 r2465, r2070, r2467, r2462;
}
mov.b32 r2531, {rs103, rs103};
{
mul.f16x2 r2469, r2238, r2531;
}
mov.b32 r2528, {rs104, rs104};
{
mul.f16x2 r2472, r2382, r2528;
}
{
sub.f16x2 r2475, r2469, r2472;
}
{
mul.f16x2 r2478, r2238, r2528;
}
{
fma.rn.f16x2 r2481, r2382, r2531, r2478;
}
mov.b32 r2499, {rs101, rs101};
{
mul.f16x2 r2485, r1962, r2499;
}
mov.b32 r2496, {rs102, rs102};
{
mul.f16x2 r2488, r2106, r2496;
}
{
sub.f16x2 r2491, r2485, r2488;
}
{
mul.f16x2 r2494, r1962, r2496;
}
{
fma.rn.f16x2 r2497, r2106, r2499, r2494;
}
mov.b32 r2515, {rs107, rs107};
{
mul.f16x2 r2501, r2274, r2515;
}
mov.b32 r2512, {rs108, rs108};
{
mul.f16x2 r2504, r2418, r2512;
}
{
sub.f16x2 r2507, r2501, r2504;
}
{
mul.f16x2 r2510, r2274, r2512;
}
{
fma.rn.f16x2 r2513, r2418, r2515, r2510;
}
{
mul.f16x2 r2517, r1890, r2531;
}
{
mul.f16x2 r2520, r2034, r2528;
}
{
sub.f16x2 r2523, r2517, r2520;
}
{
mul.f16x2 r2526, r1890, r2528;
}
{
fma.rn.f16x2 r2529, r2034, r2531, r2526;
}
mov.b32 r2547, {rs111, rs111};
{
mul.f16x2 r2533, r2202, r2547;
}
mov.b32 r2544, {rs112, rs112};
{
mul.f16x2 r2536, r2346, r2544;
}
{
sub.f16x2 r2539, r2533, r2536;
}
{
mul.f16x2 r2542, r2202, r2544;
}
{
fma.rn.f16x2 r2545, r2346, r2547, r2542;
}
{
cvt.rn.f16.f64 rs125, fd173;
}
mov.b32 r2620, {rs125, rs125};
{
cvt.rn.f16.f64 rs126, fd172;
}
{
neg.f16 rs127, rs126;
}
mov.b32 r2629, {rs127, rs127};
{
add.f16x2 r2549, r1806, r2118;
}
{
add.f16x2 r2552, r1494, r2549;
}
{
add.f16x2 r2555, r1818, r2130;
}
{
add.f16x2 r2558, r1506, r2555;
}
{
add.f16x2 r2561, r1806, r2118;
}
{
mul.f16x2 r2564, r2561, r2620;
}
{
add.f16x2 r2567, r1494, r2564;
}
{
sub.f16x2 r2570, r1818, r2130;
}
{
mul.f16x2 r2573, r2570, r2629;
}
{
add.f16x2 r2576, r2567, r2573;
}
{
add.f16x2 r2579, r1806, r2118;
}
{
mul.f16x2 r2582, r2579, r2620;
}
{
add.f16x2 r2585, r1494, r2582;
}
{
sub.f16x2 r2588, r1818, r2130;
}
{
mul.f16x2 r2591, r2588, r2629;
}
{
sub.f16x2 r2594, r2585, r2591;
}
{
add.f16x2 r2597, r1818, r2130;
}
{
mul.f16x2 r2600, r2597, r2620;
}
{
add.f16x2 r2603, r1506, r2600;
}
{
sub.f16x2 r2606, r1806, r2118;
}
{
mul.f16x2 r2609, r2606, r2629;
}
{
sub.f16x2 r2612, r2603, r2609;
}
{
add.f16x2 r2615, r1818, r2130;
}
{
mul.f16x2 r2618, r2615, r2620;
}
{
add.f16x2 r2621, r1506, r2618;
}
{
sub.f16x2 r2624, r1806, r2118;
}
{
mul.f16x2 r2627, r2624, r2629;
}
{
add.f16x2 r2630, r2621, r2627;
}
{
cvt.rn.f16.f64 rs129, fd173;
}
mov.b32 r2704, {rs129, rs129};
{
cvt.rn.f16.f64 rs130, fd172;
}
{
neg.f16 rs131, rs130;
}
mov.b32 r2713, {rs131, rs131};
{
add.f16x2 r2633, r2427, r2443;
}
{
add.f16x2 r2636, r1542, r2633;
}
{
add.f16x2 r2639, r2433, r2449;
}
{
add.f16x2 r2642, r1686, r2639;
}
{
add.f16x2 r2645, r2427, r2443;
}
{
mul.f16x2 r2648, r2645, r2704;
}
{
add.f16x2 r2651, r1542, r2648;
}
{
sub.f16x2 r2654, r2433, r2449;
}
{
mul.f16x2 r2657, r2654, r2713;
}
{
add.f16x2 r2660, r2651, r2657;
}
{
add.f16x2 r2663, r2427, r2443;
}
{
mul.f16x2 r2666, r2663, r2704;
}
{
add.f16x2 r2669, r1542, r2666;
}
{
sub.f16x2 r2672, r2433, r2449;
}
{
mul.f16x2 r2675, r2672, r2713;
}
{
sub.f16x2 r2678, r2669, r2675;
}
{
add.f16x2 r2681, r2433, r2449;
}
{
mul.f16x2 r2684, r2681, r2704;
}
{
add.f16x2 r2687, r1686, r2684;
}
{
sub.f16x2 r2690, r2427, r2443;
}
{
mul.f16x2 r2693, r2690, r2713;
}
{
sub.f16x2 r2696, r2687, r2693;
}
{
add.f16x2 r2699, r2433, r2449;
}
{
mul.f16x2 r2702, r2699, r2704;
}
{
add.f16x2 r2705, r1686, r2702;
}
{
sub.f16x2 r2708, r2427, r2443;
}
{
mul.f16x2 r2711, r2708, r2713;
}
{
add.f16x2 r2714, r2705, r2711;
}
{
cvt.rn.f16.f64 rs133, fd173;
}
mov.b32 r2788, {rs133, rs133};
{
cvt.rn.f16.f64 rs134, fd172;
}
{
neg.f16 rs135, rs134;
}
mov.b32 r2797, {rs135, rs135};
{
add.f16x2 r2717, r2459, r2475;
}
{
add.f16x2 r2720, r1614, r2717;
}
{
add.f16x2 r2723, r2465, r2481;
}
{
add.f16x2 r2726, r1758, r2723;
}
{
add.f16x2 r2729, r2459, r2475;
}
{
mul.f16x2 r2732, r2729, r2788;
}
{
add.f16x2 r2735, r1614, r2732;
}
{
sub.f16x2 r2738, r2465, r2481;
}
{
mul.f16x2 r2741, r2738, r2797;
}
{
add.f16x2 r2744, r2735, r2741;
}
{
add.f16x2 r2747, r2459, r2475;
}
{
mul.f16x2 r2750, r2747, r2788;
}
{
add.f16x2 r2753, r1614, r2750;
}
{
sub.f16x2 r2756, r2465, r2481;
}
{
mul.f16x2 r2759, r2756, r2797;
}
{
sub.f16x2 r2762, r2753, r2759;
}
{
add.f16x2 r2765, r2465, r2481;
}
{
mul.f16x2 r2768, r2765, r2788;
}
{
add.f16x2 r2771, r1758, r2768;
}
{
sub.f16x2 r2774, r2459, r2475;
}
{
mul.f16x2 r2777, r2774, r2797;
}
{
sub.f16x2 r2780, r2771, r2777;
}
{
add.f16x2 r2783, r2465, r2481;
}
{
mul.f16x2 r2786, r2783, r2788;
}
{
add.f16x2 r2789, r1758, r2786;
}
{
sub.f16x2 r2792, r2459, r2475;
}
{
mul.f16x2 r2795, r2792, r2797;
}
{
add.f16x2 r2798, r2789, r2795;
}
{
cvt.rn.f16.f64 rs137, fd173;
}
mov.b32 r2872, {rs137, rs137};
{
cvt.rn.f16.f64 rs138, fd172;
}
{
neg.f16 rs139, rs138;
}
mov.b32 r2881, {rs139, rs139};
{
add.f16x2 r2801, r2491, r2507;
}
{
add.f16x2 r2804, r1650, r2801;
}
{
add.f16x2 r2807, r2497, r2513;
}
{
add.f16x2 r2810, r1794, r2807;
}
{
add.f16x2 r2813, r2491, r2507;
}
{
mul.f16x2 r2816, r2813, r2872;
}
{
add.f16x2 r2819, r1650, r2816;
}
{
sub.f16x2 r2822, r2497, r2513;
}
{
mul.f16x2 r2825, r2822, r2881;
}
{
add.f16x2 r2828, r2819, r2825;
}
{
add.f16x2 r2831, r2491, r2507;
}
{
mul.f16x2 r2834, r2831, r2872;
}
{
add.f16x2 r2837, r1650, r2834;
}
{
sub.f16x2 r2840, r2497, r2513;
}
{
mul.f16x2 r2843, r2840, r2881;
}
{
sub.f16x2 r2846, r2837, r2843;
}
{
add.f16x2 r2849, r2497, r2513;
}
{
mul.f16x2 r2852, r2849, r2872;
}
{
add.f16x2 r2855, r1794, r2852;
}
{
sub.f16x2 r2858, r2491, r2507;
}
{
mul.f16x2 r2861, r2858, r2881;
}
{
sub.f16x2 r2864, r2855, r2861;
}
{
add.f16x2 r2867, r2497, r2513;
}
{
mul.f16x2 r2870, r2867, r2872;
}
{
add.f16x2 r2873, r1794, r2870;
}
{
sub.f16x2 r2876, r2491, r2507;
}
{
mul.f16x2 r2879, r2876, r2881;
}
{
add.f16x2 r2882, r2873, r2879;
}
{
cvt.rn.f16.f64 rs141, fd173;
}
mov.b32 r2956, {rs141, rs141};
{
cvt.rn.f16.f64 rs142, fd172;
}
{
neg.f16 rs143, rs142;
}
mov.b32 r2965, {rs143, rs143};
mov.f64 fd171, 0dBFCA9CD9AC4258F6;
{
add.f16x2 r2885, r2523, r2539;
}
{
add.f16x2 r2888, r1578, r2885;
}
{
add.f16x2 r2891, r2529, r2545;
}
{
add.f16x2 r2894, r1722, r2891;
}
{
add.f16x2 r2897, r2523, r2539;
}
{
mul.f16x2 r2900, r2897, r2956;
}
{
add.f16x2 r2903, r1578, r2900;
}
{
sub.f16x2 r2906, r2529, r2545;
}
{
mul.f16x2 r2909, r2906, r2965;
}
{
add.f16x2 r2912, r2903, r2909;
}
{
add.f16x2 r2915, r2523, r2539;
}
{
mul.f16x2 r2918, r2915, r2956;
}
{
add.f16x2 r2921, r1578, r2918;
}
{
sub.f16x2 r2924, r2529, r2545;
}
{
mul.f16x2 r2927, r2924, r2965;
}
{
sub.f16x2 r2930, r2921, r2927;
}
{
add.f16x2 r2933, r2529, r2545;
}
{
mul.f16x2 r2936, r2933, r2956;
}
{
add.f16x2 r2939, r1722, r2936;
}
{
sub.f16x2 r2942, r2523, r2539;
}
{
mul.f16x2 r2945, r2942, r2965;
}
{
sub.f16x2 r2948, r2939, r2945;
}
{
add.f16x2 r2951, r2529, r2545;
}
{
mul.f16x2 r2954, r2951, r2956;
}
{
add.f16x2 r2957, r1722, r2954;
}
{
sub.f16x2 r2960, r2523, r2539;
}
{
mul.f16x2 r2963, r2960, r2965;
}
{
add.f16x2 r2966, r2957, r2963;
}
mov.f64 fd113, 0d3FEF4CFC327A0080;
{
cvt.rn.f16.f64 rs145, fd113;
}
{
cvt.rn.f16.f64 rs146, fd171;
}
{
cvt.rn.f16.f64 rs147, fd115;
}
{
cvt.rn.f16.f64 rs148, fd138;
}
mov.f64 fd117, 0d3FE9E3779B97F4A8;
{
cvt.rn.f16.f64 rs149, fd117;
}
{
cvt.rn.f16.f64 rs150, fd136;
}
{
cvt.rn.f16.f64 rs151, fd119;
}
{
cvt.rn.f16.f64 rs152, fd134;
}
mov.f64 fd121, 0d3FE0000000000000;
{
cvt.rn.f16.f64 rs153, fd121;
}
{
cvt.rn.f16.f64 rs154, fd172;
}
{
cvt.rn.f16.f64 rs155, fd123;
}
{
cvt.rn.f16.f64 rs156, fd130;
}
mov.f64 fd125, 0d3FBAC2609B3C576C;
{
cvt.rn.f16.f64 rs157, fd125;
}
{
cvt.rn.f16.f64 rs158, fd128;
}
{
cvt.rn.f16.f64 rs159, fd127;
}
{
cvt.rn.f16.f64 rs160, fd128;
}
mov.f64 fd129, 0dBFD3C6EF372FE950;
{
cvt.rn.f16.f64 rs161, fd129;
}
{
cvt.rn.f16.f64 rs162, fd130;
}
{
cvt.rn.f16.f64 rs163, fd173;
}
{
cvt.rn.f16.f64 rs164, fd172;
}
mov.f64 fd133, 0dBFE5698496E20BD8;
{
cvt.rn.f16.f64 rs165, fd133;
}
{
cvt.rn.f16.f64 rs166, fd134;
}
{
cvt.rn.f16.f64 rs167, fd135;
}
{
cvt.rn.f16.f64 rs168, fd136;
}
mov.f64 fd137, 0dBFED3BC3AEFF7F95;
{
cvt.rn.f16.f64 rs169, fd137;
}
{
cvt.rn.f16.f64 rs170, fd138;
}
{
cvt.rn.f16.f64 rs171, fd139;
}
{
cvt.rn.f16.f64 rs172, fd171;
}
mov.b32 r2983, {rs145, rs145};
{
mul.f16x2 r2969, r2636, r2983;
}
mov.b32 r2980, {rs146, rs146};
{
mul.f16x2 r2972, r2642, r2980;
}
{
sub.f16x2 r2975, r2969, r2972;
}
{
mul.f16x2 r2978, r2636, r2980;
}
{
fma.rn.f16x2 r2981, r2642, r2983, r2978;
}
mov.b32 r2999, {rs147, rs147};
{
mul.f16x2 r2985, r2720, r2999;
}
mov.b32 r2996, {rs148, rs148};
{
mul.f16x2 r2988, r2726, r2996;
}
{
sub.f16x2 r2991, r2985, r2988;
}
{
mul.f16x2 r2994, r2720, r2996;
}
{
fma.rn.f16x2 r2997, r2726, r2999, r2994;
}
mov.b32 r3015, {rs149, rs149};
{
mul.f16x2 r3001, r2804, r3015;
}
mov.b32 r3012, {rs150, rs150};
{
mul.f16x2 r3004, r2810, r3012;
}
{
sub.f16x2 r3007, r3001, r3004;
}
{
mul.f16x2 r3010, r2804, r3012;
}
{
fma.rn.f16x2 r3013, r2810, r3015, r3010;
}
mov.b32 r3031, {rs151, rs151};
{
mul.f16x2 r3017, r2888, r3031;
}
mov.b32 r3028, {rs152, rs152};
{
mul.f16x2 r3020, r2894, r3028;
}
{
sub.f16x2 r3023, r3017, r3020;
}
{
mul.f16x2 r3026, r2888, r3028;
}
{
fma.rn.f16x2 r3029, r2894, r3031, r3026;
}
mov.b32 r3047, {rs153, rs153};
{
mul.f16x2 r3033, r2576, r3047;
}
mov.b32 r3044, {rs154, rs154};
{
mul.f16x2 r3036, r2612, r3044;
}
{
sub.f16x2 r3039, r3033, r3036;
}
{
mul.f16x2 r3042, r2576, r3044;
}
{
fma.rn.f16x2 r3045, r2612, r3047, r3042;
}
mov.b32 r3063, {rs155, rs155};
{
mul.f16x2 r3049, r2660, r3063;
}
mov.b32 r3060, {rs156, rs156};
{
mul.f16x2 r3052, r2696, r3060;
}
{
sub.f16x2 r3055, r3049, r3052;
}
{
mul.f16x2 r3058, r2660, r3060;
}
{
fma.rn.f16x2 r3061, r2696, r3063, r3058;
}
mov.b32 r3079, {rs157, rs157};
{
mul.f16x2 r3065, r2744, r3079;
}
mov.b32 r3076, {rs158, rs158};
{
mul.f16x2 r3068, r2780, r3076;
}
{
sub.f16x2 r3071, r3065, r3068;
}
{
mul.f16x2 r3074, r2744, r3076;
}
{
fma.rn.f16x2 r3077, r2780, r3079, r3074;
}
mov.b32 r3095, {rs159, rs159};
{
mul.f16x2 r3081, r2828, r3095;
}
mov.b32 r3092, {rs160, rs160};
{
mul.f16x2 r3084, r2864, r3092;
}
{
sub.f16x2 r3087, r3081, r3084;
}
{
mul.f16x2 r3090, r2828, r3092;
}
{
fma.rn.f16x2 r3093, r2864, r3095, r3090;
}
mov.b32 r3111, {rs161, rs161};
{
mul.f16x2 r3097, r2912, r3111;
}
mov.b32 r3108, {rs162, rs162};
{
mul.f16x2 r3100, r2948, r3108;
}
{
sub.f16x2 r3103, r3097, r3100;
}
{
mul.f16x2 r3106, r2912, r3108;
}
{
fma.rn.f16x2 r3109, r2948, r3111, r3106;
}
mov.b32 r3127, {rs163, rs163};
{
mul.f16x2 r3113, r2594, r3127;
}
mov.b32 r3124, {rs164, rs164};
{
mul.f16x2 r3116, r2630, r3124;
}
{
sub.f16x2 r3119, r3113, r3116;
}
{
mul.f16x2 r3122, r2594, r3124;
}
{
fma.rn.f16x2 r3125, r2630, r3127, r3122;
}
mov.b32 r3143, {rs165, rs165};
{
mul.f16x2 r3129, r2678, r3143;
}
mov.b32 r3140, {rs166, rs166};
{
mul.f16x2 r3132, r2714, r3140;
}
{
sub.f16x2 r3135, r3129, r3132;
}
{
mul.f16x2 r3138, r2678, r3140;
}
{
fma.rn.f16x2 r3141, r2714, r3143, r3138;
}
mov.b32 r3159, {rs167, rs167};
{
mul.f16x2 r3145, r2762, r3159;
}
mov.b32 r3156, {rs168, rs168};
{
mul.f16x2 r3148, r2798, r3156;
}
{
sub.f16x2 r3151, r3145, r3148;
}
{
mul.f16x2 r3154, r2762, r3156;
}
{
fma.rn.f16x2 r3157, r2798, r3159, r3154;
}
mov.b32 r3175, {rs169, rs169};
{
mul.f16x2 r3161, r2846, r3175;
}
mov.b32 r3172, {rs170, rs170};
{
mul.f16x2 r3164, r2882, r3172;
}
{
sub.f16x2 r3167, r3161, r3164;
}
{
mul.f16x2 r3170, r2846, r3172;
}
{
fma.rn.f16x2 r3173, r2882, r3175, r3170;
}
mov.b32 r3191, {rs171, rs171};
{
mul.f16x2 r3177, r2930, r3191;
}
mov.b32 r3188, {rs172, rs172};
{
mul.f16x2 r3180, r2966, r3188;
}
{
sub.f16x2 r3183, r3177, r3180;
}
{
mul.f16x2 r3186, r2930, r3188;
}
{
fma.rn.f16x2 r3189, r2966, r3191, r3186;
}
{
add.f16x2 %0, r1068, r2552;
}
{
add.f16x2 %1, r1074, r2558;
}
{
sub.f16x2 %30, r1068, r2552;
}
{
sub.f16x2 %31, r1074, r2558;
}
{
add.f16x2 %2, r1152, r2975;
}
{
add.f16x2 %3, r1158, r2981;
}
{
sub.f16x2 %32, r1152, r2975;
}
{
sub.f16x2 %33, r1158, r2981;
}
{
add.f16x2 %4, r1236, r2991;
}
{
add.f16x2 %5, r1242, r2997;
}
{
sub.f16x2 %34, r1236, r2991;
}
{
sub.f16x2 %35, r1242, r2997;
}
{
add.f16x2 %6, r1320, r3007;
}
{
add.f16x2 %7, r1326, r3013;
}
{
sub.f16x2 %36, r1320, r3007;
}
{
sub.f16x2 %37, r1326, r3013;
}
{
add.f16x2 %8, r1404, r3023;
}
{
add.f16x2 %9, r1410, r3029;
}
{
sub.f16x2 %38, r1404, r3023;
}
{
sub.f16x2 %39, r1410, r3029;
}
{
add.f16x2 %10, r1092, r3039;
}
{
add.f16x2 %11, r1128, r3045;
}
{
sub.f16x2 %40, r1092, r3039;
}
{
sub.f16x2 %41, r1128, r3045;
}
{
add.f16x2 %12, r1176, r3055;
}
{
add.f16x2 %13, r1212, r3061;
}
{
sub.f16x2 %42, r1176, r3055;
}
{
sub.f16x2 %43, r1212, r3061;
}
{
add.f16x2 %14, r1260, r3071;
}
{
add.f16x2 %15, r1296, r3077;
}
{
sub.f16x2 %44, r1260, r3071;
}
{
sub.f16x2 %45, r1296, r3077;
}
{
add.f16x2 %16, r1344, r3087;
}
{
add.f16x2 %17, r1380, r3093;
}
{
sub.f16x2 %46, r1344, r3087;
}
{
sub.f16x2 %47, r1380, r3093;
}
{
add.f16x2 %18, r1428, r3103;
}
{
add.f16x2 %19, r1464, r3109;
}
{
sub.f16x2 %48, r1428, r3103;
}
{
sub.f16x2 %49, r1464, r3109;
}
{
add.f16x2 %20, r1110, r3119;
}
{
add.f16x2 %21, r1146, r3125;
}
{
sub.f16x2 %50, r1110, r3119;
}
{
sub.f16x2 %51, r1146, r3125;
}
{
add.f16x2 %22, r1194, r3135;
}
{
add.f16x2 %23, r1230, r3141;
}
{
sub.f16x2 %52, r1194, r3135;
}
{
sub.f16x2 %53, r1230, r3141;
}
{
add.f16x2 %24, r1278, r3151;
}
{
add.f16x2 %25, r1314, r3157;
}
{
sub.f16x2 %54, r1278, r3151;
}
{
sub.f16x2 %55, r1314, r3157;
}
{
add.f16x2 %26, r1362, r3167;
}
{
add.f16x2 %27, r1398, r3173;
}
{
sub.f16x2 %56, r1362, r3167;
}
{
sub.f16x2 %57, r1398, r3173;
}
{
add.f16x2 %28, r1446, r3183;
}
{
add.f16x2 %29, r1482, r3189;
}
{
sub.f16x2 %58, r1446, r3183;
}
{
sub.f16x2 %59, r1482, r3189;
}
})"
     : "=r"(__HALF2_TO_UI(rmem[0].x)), "=r"(__HALF2_TO_UI(rmem[0].y)), "=r"(__HALF2_TO_UI(rmem[1].x)), "=r"(__HALF2_TO_UI(rmem[1].y)), "=r"(__HALF2_TO_UI(rmem[2].x)), "=r"(__HALF2_TO_UI(rmem[2].y)), "=r"(__HALF2_TO_UI(rmem[3].x)), "=r"(__HALF2_TO_UI(rmem[3].y)), "=r"(__HALF2_TO_UI(rmem[4].x)), "=r"(__HALF2_TO_UI(rmem[4].y)), "=r"(__HALF2_TO_UI(rmem[5].x)), "=r"(__HALF2_TO_UI(rmem[5].y)), "=r"(__HALF2_TO_UI(rmem[6].x)), "=r"(__HALF2_TO_UI(rmem[6].y)), "=r"(__HALF2_TO_UI(rmem[7].x)), "=r"(__HALF2_TO_UI(rmem[7].y)), "=r"(__HALF2_TO_UI(rmem[8].x)), "=r"(__HALF2_TO_UI(rmem[8].y)), "=r"(__HALF2_TO_UI(rmem[9].x)), "=r"(__HALF2_TO_UI(rmem[9].y)), "=r"(__HALF2_TO_UI(rmem[10].x)), "=r"(__HALF2_TO_UI(rmem[10].y)), "=r"(__HALF2_TO_UI(rmem[11].x)), "=r"(__HALF2_TO_UI(rmem[11].y)), "=r"(__HALF2_TO_UI(rmem[12].x)), "=r"(__HALF2_TO_UI(rmem[12].y)), "=r"(__HALF2_TO_UI(rmem[13].x)), "=r"(__HALF2_TO_UI(rmem[13].y)), "=r"(__HALF2_TO_UI(rmem[14].x)), "=r"(__HALF2_TO_UI(rmem[14].y)), "=r"(__HALF2_TO_UI(rmem[15].x)), "=r"(__HALF2_TO_UI(rmem[15].y)), "=r"(__HALF2_TO_UI(rmem[16].x)), "=r"(__HALF2_TO_UI(rmem[16].y)), "=r"(__HALF2_TO_UI(rmem[17].x)), "=r"(__HALF2_TO_UI(rmem[17].y)), "=r"(__HALF2_TO_UI(rmem[18].x)), "=r"(__HALF2_TO_UI(rmem[18].y)), "=r"(__HALF2_TO_UI(rmem[19].x)), "=r"(__HALF2_TO_UI(rmem[19].y)), "=r"(__HALF2_TO_UI(rmem[20].x)), "=r"(__HALF2_TO_UI(rmem[20].y)), "=r"(__HALF2_TO_UI(rmem[21].x)), "=r"(__HALF2_TO_UI(rmem[21].y)), "=r"(__HALF2_TO_UI(rmem[22].x)), "=r"(__HALF2_TO_UI(rmem[22].y)), "=r"(__HALF2_TO_UI(rmem[23].x)), "=r"(__HALF2_TO_UI(rmem[23].y)), "=r"(__HALF2_TO_UI(rmem[24].x)), "=r"(__HALF2_TO_UI(rmem[24].y)), "=r"(__HALF2_TO_UI(rmem[25].x)), "=r"(__HALF2_TO_UI(rmem[25].y)), "=r"(__HALF2_TO_UI(rmem[26].x)), "=r"(__HALF2_TO_UI(rmem[26].y)), "=r"(__HALF2_TO_UI(rmem[27].x)), "=r"(__HALF2_TO_UI(rmem[27].y)), "=r"(__HALF2_TO_UI(rmem[28].x)), "=r"(__HALF2_TO_UI(rmem[28].y)), "=r"(__HALF2_TO_UI(rmem[29].x)), "=r"(__HALF2_TO_UI(rmem[29].y)): "r"(__HALF2_TO_UI(rmem[18].y)), "r"(__HALF2_TO_UI(rmem[6].y)), "r"(__HALF2_TO_UI(rmem[0].y)), "r"(__HALF2_TO_UI(rmem[24].x)), "r"(__HALF2_TO_UI(rmem[12].y)), "r"(__HALF2_TO_UI(rmem[18].x)), "r"(__HALF2_TO_UI(rmem[6].x)), "r"(__HALF2_TO_UI(rmem[0].x)), "r"(__HALF2_TO_UI(rmem[24].y)), "r"(__HALF2_TO_UI(rmem[12].x)), "r"(__HALF2_TO_UI(rmem[2].y)), "r"(__HALF2_TO_UI(rmem[26].x)), "r"(__HALF2_TO_UI(rmem[14].y)), "r"(__HALF2_TO_UI(rmem[20].x)), "r"(__HALF2_TO_UI(rmem[8].x)), "r"(__HALF2_TO_UI(rmem[2].x)), "r"(__HALF2_TO_UI(rmem[26].y)), "r"(__HALF2_TO_UI(rmem[14].x)), "r"(__HALF2_TO_UI(rmem[20].y)), "r"(__HALF2_TO_UI(rmem[8].y)), "r"(__HALF2_TO_UI(rmem[22].x)), "r"(__HALF2_TO_UI(rmem[10].x)), "r"(__HALF2_TO_UI(rmem[4].x)), "r"(__HALF2_TO_UI(rmem[28].y)), "r"(__HALF2_TO_UI(rmem[16].x)), "r"(__HALF2_TO_UI(rmem[22].y)), "r"(__HALF2_TO_UI(rmem[10].y)), "r"(__HALF2_TO_UI(rmem[4].y)), "r"(__HALF2_TO_UI(rmem[28].x)), "r"(__HALF2_TO_UI(rmem[16].y)), "r"(__HALF2_TO_UI(rmem[19].y)), "r"(__HALF2_TO_UI(rmem[7].y)), "r"(__HALF2_TO_UI(rmem[1].y)), "r"(__HALF2_TO_UI(rmem[25].x)), "r"(__HALF2_TO_UI(rmem[13].y)), "r"(__HALF2_TO_UI(rmem[19].x)), "r"(__HALF2_TO_UI(rmem[7].x)), "r"(__HALF2_TO_UI(rmem[1].x)), "r"(__HALF2_TO_UI(rmem[25].y)), "r"(__HALF2_TO_UI(rmem[13].x)), "r"(__HALF2_TO_UI(rmem[3].y)), "r"(__HALF2_TO_UI(rmem[27].x)), "r"(__HALF2_TO_UI(rmem[15].y)), "r"(__HALF2_TO_UI(rmem[9].x)), "r"(__HALF2_TO_UI(rmem[21].x)), "r"(__HALF2_TO_UI(rmem[3].x)), "r"(__HALF2_TO_UI(rmem[27].y)), "r"(__HALF2_TO_UI(rmem[15].x)), "r"(__HALF2_TO_UI(rmem[21].y)), "r"(__HALF2_TO_UI(rmem[9].y)), "r"(__HALF2_TO_UI(rmem[17].y)), "r"(__HALF2_TO_UI(rmem[5].x)), "r"(__HALF2_TO_UI(rmem[23].x)), "r"(__HALF2_TO_UI(rmem[11].x)), "r"(__HALF2_TO_UI(rmem[17].x)), "r"(__HALF2_TO_UI(rmem[29].y)), "r"(__HALF2_TO_UI(rmem[11].y)), "r"(__HALF2_TO_UI(rmem[23].y)), "r"(__HALF2_TO_UI(rmem[5].y)), "r"(__HALF2_TO_UI(rmem[29].x)));
};


#endif
